# utils/config.py
"""
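RAG system configuration: embedding model names, text-splitting
parameters, retriever settings, and supported document formats.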
"""

# Embedding model configuration: maps a short alias to a model identifier
# string (presumably Hugging Face Hub model IDs -- confirm against the loader).
EMBEDDING_MODELS = dict(
    chinese_small="BAAI/bge-small-zh",
    chinese_large="BAAI/bge-large-zh",
    multilingual="sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2",
)

# Text splitting configuration.
# The separators are listed from coarse to fine: blank line, newline,
# full-width sentence punctuation, full-width semicolon and comma, then space.
# NOTE(review): no empty-string fallback separator is listed; if the consumer
# is a recursive character splitter, confirm whether one is needed.
TEXT_SPLITTER_CONFIG = dict(
    chunk_size=500,
    chunk_overlap=50,
    separators=[
        "\n\n",
        "\n",
        "。",
        "！",
        "？",
        "；",
        "，",
        " ",
    ],
)

# Retrieval configuration: the search type plus the keyword arguments for the
# search (here, k=3).
RETRIEVER_CONFIG = dict(
    search_type="similarity",
    search_kwargs=dict(k=3),
)

# Supported document formats, given as file extensions with a leading dot.
SUPPORTED_FORMATS = [
    ".txt",
    ".pdf",
    ".md",
]